See تتا on Wiktionary
{ "etymology_number": 1, "etymology_templates": [ { "args": { "1": "pa", "2": "ine-pro", "3": "*tep-" }, "expansion": "", "name": "root" }, { "args": { "1": "pa", "2": "sa", "3": "तप्" }, "expansion": "", "name": "root" }, { "args": { "1": "Inherited" }, "expansion": "Inherited", "name": "glossary" }, { "args": { "1": "pa", "2": "pra", "3": "𑀢𑀢𑁆𑀢", "4": "", "5": "", "g": "", "g2": "", "g3": "", "id": "", "lit": "", "nocat": "", "pos": "", "sc": "", "sort": "", "tr": "", "ts": "" }, "expansion": "Prakrit 𑀢𑀢𑁆𑀢 (tatta)", "name": "inh" }, { "args": { "1": "pa", "2": "pra", "3": "𑀢𑀢𑁆𑀢" }, "expansion": "Inherited from Prakrit 𑀢𑀢𑁆𑀢 (tatta)", "name": "inh+" }, { "args": { "1": "pa", "2": "sa", "3": "तप्त", "tr": "taptá" }, "expansion": "Sanskrit तप्त (taptá)", "name": "inh" }, { "args": { "1": "pa", "2": "ine-pro", "3": "*tep-", "4": "", "5": "to be hot, warm" }, "expansion": "Proto-Indo-European *tep- (“to be hot, warm”)", "name": "inh" } ], "etymology_text": "Inherited from Prakrit 𑀢𑀢𑁆𑀢 (tatta), from Sanskrit तप्त (taptá), ultimately from Proto-Indo-European *tep- (“to be hot, warm”).", "forms": [ { "form": "تَتّا", "tags": [ "canonical" ] }, { "form": "tattā", "tags": [ "romanization" ] }, { "form": "ਤੱਤਾ", "tags": [ "Gurmukhi" ] }, { "form": "no-table-tags", "source": "declension", "tags": [ "table-tags" ] }, { "form": "pnb-decl-adj", "source": "declension", "tags": [ "inflection-template" ] }, { "form": "تَتّا", "roman": "tattā", "source": "declension", "tags": [ "direct", "masculine", "singular" ] }, { "form": "تَتّے", "roman": "tatte", "source": "declension", "tags": [ "direct", "masculine", "plural" ] }, { "form": "تَتّی", "roman": "tattī", "source": "declension", "tags": [ "direct", "feminine", "singular" ] }, { "form": "تَتِّیاں", "roman": "tattiyāṉ", "source": "declension", "tags": [ "direct", "feminine", "plural" ] }, { "form": "تَتّے", "roman": "tatte", "source": "declension", "tags": [ "masculine", "oblique", "singular" ] }, { "form": "تَتّیاں", "roman": "tatteyāṉ", "source": "declension", "tags": [ "masculine", "oblique", "plural" ] }, { "form": "تَتّی", "roman": "tattī", "source": "declension", "tags": [ "feminine", "oblique", "singular" ] }, { "form": "تَتِّیاں", "roman": "tattiyāṉ", "source": "declension", "tags": [ "feminine", "oblique", "plural" ] } ], "head_templates": [ { "args": { "gur": "ਤੱਤਾ", "head": "تَتّا" }, "expansion": "تَتّا • (tattā) (Gurmukhi spelling ਤੱਤਾ)", "name": "pa-adj" } ], "inflection_templates": [ { "args": { "1": "تَتّ", "2": "tatt" }, "name": "pnb-decl-adj" } ], "lang": "Punjabi", "lang_code": "pa", "pos": "adj", "related": [ { "_dis1": "0 0 0 0 0", "english": "to heat up; become hot, heated", "roman": "tappṇā", "tags": [ "verb" ], "word": "تَپّݨا" } ], "senses": [ { "glosses": [ "hot; warm" ], "id": "en-تتا-pa-adj-NTwicwW5", "links": [ [ "hot", "hot" ], [ "warm", "warm" ] ] }, { "categories": [ { "_dis": "0 37 0 2 37 25", "kind": "other", "name": "Pages with 2 entries", "parents": [], "source": "w+disamb" }, { "_dis": "0 38 0 1 38 23", "kind": "other", "name": "Pages with entries", "parents": [], "source": "w+disamb" }, { "_dis": "4 44 5 6 40", "kind": "other", "name": "Punjabi adjectives in Shahmukhi script", "parents": [], "source": "w+disamb" }, { "_dis": "1 37 2 2 36 22", "kind": "other", "name": "Punjabi entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w+disamb" }, { "_dis": "1 39 2 3 36 19", "kind": "other", "name": "Punjabi interjections in Shahmukhi script", "parents": [], "source": "w+disamb" }, { "_dis": "1 55 2 3 39", "kind": "other", "name": "Punjabi terms with redundant transliterations", "parents": [ "Terms with redundant transliterations", "Entry maintenance" ], "source": "w+disamb" } ], "glosses": [ "short-tempered; hotheaded" ], "id": "en-تتا-pa-adj-tJ9HfwOo", "links": [ [ "short-tempered", "short-tempered" ], [ "hotheaded", "hotheaded" ] ], "raw_glosses": [ "(figuratively) short-tempered; hotheaded" ], "tags": [ "figuratively" ] }, { "categories": [], "glosses": [ "brave; courageous" ], "id": "en-تتا-pa-adj-RtSpttq0", "links": [ [ "brave", "brave" ], [ "courageous", "courageous" ] ], "raw_glosses": [ "(figuratively, rare) brave; courageous" ], "tags": [ "figuratively", "rare" ] }, { "categories": [], "glosses": [ "stubborn, obstinate" ], "id": "en-تتا-pa-adj-weao9Wz5", "links": [ [ "stubborn", "stubborn" ], [ "obstinate", "obstinate" ] ], "raw_glosses": [ "(figuratively, rare) stubborn, obstinate" ], "tags": [ "figuratively", "rare" ] }, { "categories": [ { "_dis": "0 37 0 2 37 25", "kind": "other", "name": "Pages with 2 entries", "parents": [], "source": "w+disamb" }, { "_dis": "0 38 0 1 38 23", "kind": "other", "name": "Pages with entries", "parents": [], "source": "w+disamb" }, { "_dis": "4 44 5 6 40", "kind": "other", "name": "Punjabi adjectives in Shahmukhi script", "parents": [], "source": "w+disamb" }, { "_dis": "1 37 2 2 36 22", "kind": "other", "name": "Punjabi entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w+disamb" }, { "_dis": "1 39 2 3 36 19", "kind": "other", "name": "Punjabi interjections in Shahmukhi script", "parents": [], "source": "w+disamb" } ], "glosses": [ "ill-fated; unlucky" ], "id": "en-تتا-pa-adj-WUqrynIN", "links": [ [ "ill-fated", "ill-fated" ], [ "unlucky", "unlucky" ] ] } ], "sounds": [ { "ipa": "/t̪ət̪.t̪äː/", "note": "Standard Punjabi" }, { "rhymes": "-äː" } ], "word": "تتا" } { "etymology_number": 2, "forms": [ { "form": "تَتّا", "tags": [ "canonical" ] }, { "form": "tattā", "tags": [ "romanization" ] }, { "form": "ਤੱਤਾ", "tags": [ "Gurmukhi" ] } ], "head_templates": [ { "args": { "gur": "ਤੱਤਾ", "head": "تَتّا" }, "expansion": "تَتّا • (tattā) (Gurmukhi spelling ਤੱਤਾ)", "name": "pa-interj" } ], "lang": "Punjabi", "lang_code": "pa", "pos": "intj", "senses": [ { "categories": [ { "_dis": "0 37 0 2 37 25", "kind": "other", "name": "Pages with 2 entries", "parents": [], "source": "w+disamb" }, { "_dis": "0 38 0 1 38 23", "kind": "other", "name": "Pages with entries", "parents": [], "source": "w+disamb" }, { "_dis": "1 37 2 2 36 22", "kind": "other", "name": "Punjabi entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w+disamb" }, { "_dis": "1 39 2 3 36 19", "kind": "other", "name": "Punjabi interjections in Shahmukhi script", "parents": [], "source": "w+disamb" } ], "glosses": [ "Ploughman's call to bullocks to go slightly to the right." ], "id": "en-تتا-pa-intj--NxA3lTb", "links": [ [ "Ploughman", "ploughman" ], [ "bullocks", "bullocks" ] ] } ], "sounds": [ { "ipa": "/t̪ət̪.t̪äː/", "note": "Standard Punjabi" }, { "rhymes": "-äː" } ], "word": "تتا" } { "etymology_templates": [ { "args": { "1": "skr", "2": "ine-pro", "3": "*tep-" }, "expansion": "", "name": "root" }, { "args": { "1": "Inherited" }, "expansion": "Inherited", "name": "glossary" }, { "args": { "1": "skr", "2": "pra", "3": "𑀢𑀢𑁆𑀢", "4": "", "5": "", "g": "", "g2": "", "g3": "", "id": "", "lit": "", "nocat": "", "pos": "", "sc": "", "sort": "", "tr": "", "ts": "" }, "expansion": "Prakrit 𑀢𑀢𑁆𑀢 (tatta)", "name": "inh" }, { "args": { "1": "skr", "2": "pra", "3": "𑀢𑀢𑁆𑀢" }, "expansion": "Inherited from Prakrit 𑀢𑀢𑁆𑀢 (tatta)", "name": "inh+" }, { "args": { "1": "skr", "2": "sa", "3": "तप्त", "tr": "taptá" }, "expansion": "Sanskrit तप्त (taptá)", "name": "inh" }, { "args": { "1": "skr", "2": "ine-pro", "3": "*tep-", "4": "", "5": "to be hot, warm" }, "expansion": "Proto-Indo-European *tep- (“to be hot, warm”)", "name": "inh" } ], "etymology_text": "Inherited from Prakrit 𑀢𑀢𑁆𑀢 (tatta), from Sanskrit तप्त (taptá), ultimately from Proto-Indo-European *tep- (“to be hot, warm”).", "forms": [ { "form": "تَتّا", "tags": [ "canonical", "masculine" ] }, { "form": "tattā", "tags": [ "romanization" ] }, { "form": "no-table-tags", "source": "declension", "tags": [ "table-tags" ] }, { "form": "skr-decl-adj", "source": "declension", "tags": [ "inflection-template" ] }, { "form": "تتا", "roman": "tattā", "source": "declension", "tags": [ "direct", "masculine", "singular" ] }, { "form": "تتے", "roman": "tatte", "source": "declension", "tags": [ "direct", "masculine", "plural" ] }, { "form": "تتی", "roman": "tattī", "source": "declension", "tags": [ "direct", "feminine", "singular" ] }, { "form": "تتِیاں", "roman": "tattīyā̃", "source": "declension", "tags": [ "direct", "feminine", "plural" ] }, { "form": "تتے", "roman": "tatte", "source": "declension", "tags": [ "masculine", "oblique", "singular" ] }, { "form": "تتیاں", "roman": "tatteyā̃", "source": "declension", "tags": [ "masculine", "oblique", "plural" ] }, { "form": "تتی", "roman": "tattī", "source": "declension", "tags": [ "feminine", "oblique", "singular" ] }, { "form": "تتِیاں", "roman": "tattīyā̃", "source": "declension", "tags": [ "feminine", "oblique", "plural" ] } ], "head_templates": [ { "args": { "1": "skr", "2": "adjective", "g": "m", "head": "تَتّا" }, "expansion": "تَتّا (tattā) m", "name": "head" } ], "inflection_templates": [ { "args": { "1": "تت", "2": "tatt" }, "name": "skr-decl-adj" } ], "lang": "Saraiki", "lang_code": "skr", "pos": "adj", "senses": [ { "categories": [ { "kind": "other", "name": "Pages with 2 entries", "parents": [], "source": "w" }, { "kind": "other", "name": "Pages with entries", "parents": [], "source": "w" }, { "kind": "other", "name": "Sanskrit terms with non-redundant manual transliterations", "parents": [ "Terms with non-redundant manual transliterations", "Entry maintenance" ], "source": "w" }, { "kind": "other", "name": "Saraiki entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w" }, { "kind": "other", "name": "Saraiki links with redundant wikilinks", "parents": [ "Links with redundant wikilinks", "Entry maintenance" ], "source": "w" }, { "kind": "other", "name": "Saraiki terms with non-redundant manual transliterations", "parents": [ "Terms with non-redundant manual transliterations", "Entry maintenance" ], "source": "w" } ], "glosses": [ "hot, heated, warm" ], "id": "en-تتا-skr-adj-oI15E7cY", "links": [ [ "hot", "hot" ], [ "heated", "heated" ], [ "warm", "warm" ] ] } ], "sounds": [ { "ipa": "/t̪ət̪.t̪aː/" }, { "rhymes": "-aː" } ], "word": "تتا" }
{ "categories": [ "Pages with 2 entries", "Pages with entries", "Punjabi adjectives", "Punjabi adjectives in Shahmukhi script", "Punjabi entries with incorrect language header", "Punjabi interjections", "Punjabi interjections in Shahmukhi script", "Punjabi lemmas", "Punjabi terms derived from Prakrit", "Punjabi terms derived from Proto-Indo-European", "Punjabi terms derived from Sanskrit", "Punjabi terms derived from the Proto-Indo-European root *tep-", "Punjabi terms derived from the Sanskrit root तप्", "Punjabi terms inherited from Prakrit", "Punjabi terms inherited from Proto-Indo-European", "Punjabi terms inherited from Sanskrit", "Punjabi terms with redundant transliterations", "Rhymes:Punjabi/äː", "Rhymes:Punjabi/äː/2 syllables" ], "etymology_number": 1, "etymology_templates": [ { "args": { "1": "pa", "2": "ine-pro", "3": "*tep-" }, "expansion": "", "name": "root" }, { "args": { "1": "pa", "2": "sa", "3": "तप्" }, "expansion": "", "name": "root" }, { "args": { "1": "Inherited" }, "expansion": "Inherited", "name": "glossary" }, { "args": { "1": "pa", "2": "pra", "3": "𑀢𑀢𑁆𑀢", "4": "", "5": "", "g": "", "g2": "", "g3": "", "id": "", "lit": "", "nocat": "", "pos": "", "sc": "", "sort": "", "tr": "", "ts": "" }, "expansion": "Prakrit 𑀢𑀢𑁆𑀢 (tatta)", "name": "inh" }, { "args": { "1": "pa", "2": "pra", "3": "𑀢𑀢𑁆𑀢" }, "expansion": "Inherited from Prakrit 𑀢𑀢𑁆𑀢 (tatta)", "name": "inh+" }, { "args": { "1": "pa", "2": "sa", "3": "तप्त", "tr": "taptá" }, "expansion": "Sanskrit तप्त (taptá)", "name": "inh" }, { "args": { "1": "pa", "2": "ine-pro", "3": "*tep-", "4": "", "5": "to be hot, warm" }, "expansion": "Proto-Indo-European *tep- (“to be hot, warm”)", "name": "inh" } ], "etymology_text": "Inherited from Prakrit 𑀢𑀢𑁆𑀢 (tatta), from Sanskrit तप्त (taptá), ultimately from Proto-Indo-European *tep- (“to be hot, warm”).", "forms": [ { "form": "تَتّا", "tags": [ "canonical" ] }, { "form": "tattā", "tags": [ "romanization" ] }, { "form": "ਤੱਤਾ", "tags": [ "Gurmukhi" ] }, { "form": "no-table-tags", "source": "declension", "tags": [ "table-tags" ] }, { "form": "pnb-decl-adj", "source": "declension", "tags": [ "inflection-template" ] }, { "form": "تَتّا", "roman": "tattā", "source": "declension", "tags": [ "direct", "masculine", "singular" ] }, { "form": "تَتّے", "roman": "tatte", "source": "declension", "tags": [ "direct", "masculine", "plural" ] }, { "form": "تَتّی", "roman": "tattī", "source": "declension", "tags": [ "direct", "feminine", "singular" ] }, { "form": "تَتِّیاں", "roman": "tattiyāṉ", "source": "declension", "tags": [ "direct", "feminine", "plural" ] }, { "form": "تَتّے", "roman": "tatte", "source": "declension", "tags": [ "masculine", "oblique", "singular" ] }, { "form": "تَتّیاں", "roman": "tatteyāṉ", "source": "declension", "tags": [ "masculine", "oblique", "plural" ] }, { "form": "تَتّی", "roman": "tattī", "source": "declension", "tags": [ "feminine", "oblique", "singular" ] }, { "form": "تَتِّیاں", "roman": "tattiyāṉ", "source": "declension", "tags": [ "feminine", "oblique", "plural" ] } ], "head_templates": [ { "args": { "gur": "ਤੱਤਾ", "head": "تَتّا" }, "expansion": "تَتّا • (tattā) (Gurmukhi spelling ਤੱਤਾ)", "name": "pa-adj" } ], "inflection_templates": [ { "args": { "1": "تَتّ", "2": "tatt" }, "name": "pnb-decl-adj" } ], "lang": "Punjabi", "lang_code": "pa", "pos": "adj", "related": [ { "english": "to heat up; become hot, heated", "roman": "tappṇā", "tags": [ "verb" ], "word": "تَپّݨا" } ], "senses": [ { "glosses": [ "hot; warm" ], "links": [ [ "hot", "hot" ], [ "warm", "warm" ] ] }, { "glosses": [ "short-tempered; hotheaded" ], "links": [ [ "short-tempered", "short-tempered" ], [ "hotheaded", "hotheaded" ] ], "raw_glosses": [ "(figuratively) short-tempered; hotheaded" ], "tags": [ "figuratively" ] }, { "categories": [ "Punjabi terms with rare senses" ], "glosses": [ "brave; courageous" ], "links": [ [ "brave", "brave" ], [ "courageous", "courageous" ] ], "raw_glosses": [ "(figuratively, rare) brave; courageous" ], "tags": [ "figuratively", "rare" ] }, { "categories": [ "Punjabi terms with rare senses" ], "glosses": [ "stubborn, obstinate" ], "links": [ [ "stubborn", "stubborn" ], [ "obstinate", "obstinate" ] ], "raw_glosses": [ "(figuratively, rare) stubborn, obstinate" ], "tags": [ "figuratively", "rare" ] }, { "glosses": [ "ill-fated; unlucky" ], "links": [ [ "ill-fated", "ill-fated" ], [ "unlucky", "unlucky" ] ] } ], "sounds": [ { "ipa": "/t̪ət̪.t̪äː/", "note": "Standard Punjabi" }, { "rhymes": "-äː" } ], "word": "تتا" } { "categories": [ "Pages with 2 entries", "Pages with entries", "Punjabi entries with incorrect language header", "Punjabi interjections", "Punjabi interjections in Shahmukhi script", "Punjabi lemmas", "Rhymes:Punjabi/äː", "Rhymes:Punjabi/äː/2 syllables" ], "etymology_number": 2, "forms": [ { "form": "تَتّا", "tags": [ "canonical" ] }, { "form": "tattā", "tags": [ "romanization" ] }, { "form": "ਤੱਤਾ", "tags": [ "Gurmukhi" ] } ], "head_templates": [ { "args": { "gur": "ਤੱਤਾ", "head": "تَتّا" }, "expansion": "تَتّا • (tattā) (Gurmukhi spelling ਤੱਤਾ)", "name": "pa-interj" } ], "lang": "Punjabi", "lang_code": "pa", "pos": "intj", "senses": [ { "glosses": [ "Ploughman's call to bullocks to go slightly to the right." ], "links": [ [ "Ploughman", "ploughman" ], [ "bullocks", "bullocks" ] ] } ], "sounds": [ { "ipa": "/t̪ət̪.t̪äː/", "note": "Standard Punjabi" }, { "rhymes": "-äː" } ], "word": "تتا" } { "etymology_templates": [ { "args": { "1": "skr", "2": "ine-pro", "3": "*tep-" }, "expansion": "", "name": "root" }, { "args": { "1": "Inherited" }, "expansion": "Inherited", "name": "glossary" }, { "args": { "1": "skr", "2": "pra", "3": "𑀢𑀢𑁆𑀢", "4": "", "5": "", "g": "", "g2": "", "g3": "", "id": "", "lit": "", "nocat": "", "pos": "", "sc": "", "sort": "", "tr": "", "ts": "" }, "expansion": "Prakrit 𑀢𑀢𑁆𑀢 (tatta)", "name": "inh" }, { "args": { "1": "skr", "2": "pra", "3": "𑀢𑀢𑁆𑀢" }, "expansion": "Inherited from Prakrit 𑀢𑀢𑁆𑀢 (tatta)", "name": "inh+" }, { "args": { "1": "skr", "2": "sa", "3": "तप्त", "tr": "taptá" }, "expansion": "Sanskrit तप्त (taptá)", "name": "inh" }, { "args": { "1": "skr", "2": "ine-pro", "3": "*tep-", "4": "", "5": "to be hot, warm" }, "expansion": "Proto-Indo-European *tep- (“to be hot, warm”)", "name": "inh" } ], "etymology_text": "Inherited from Prakrit 𑀢𑀢𑁆𑀢 (tatta), from Sanskrit तप्त (taptá), ultimately from Proto-Indo-European *tep- (“to be hot, warm”).", "forms": [ { "form": "تَتّا", "tags": [ "canonical", "masculine" ] }, { "form": "tattā", "tags": [ "romanization" ] }, { "form": "no-table-tags", "source": "declension", "tags": [ "table-tags" ] }, { "form": "skr-decl-adj", "source": "declension", "tags": [ "inflection-template" ] }, { "form": "تتا", "roman": "tattā", "source": "declension", "tags": [ "direct", "masculine", "singular" ] }, { "form": "تتے", "roman": "tatte", "source": "declension", "tags": [ "direct", "masculine", "plural" ] }, { "form": "تتی", "roman": "tattī", "source": "declension", "tags": [ "direct", "feminine", "singular" ] }, { "form": "تتِیاں", "roman": "tattīyā̃", "source": "declension", "tags": [ "direct", "feminine", "plural" ] }, { "form": "تتے", "roman": "tatte", "source": "declension", "tags": [ "masculine", "oblique", "singular" ] }, { "form": "تتیاں", "roman": "tatteyā̃", "source": "declension", "tags": [ "masculine", "oblique", "plural" ] }, { "form": "تتی", "roman": "tattī", "source": "declension", "tags": [ "feminine", "oblique", "singular" ] }, { "form": "تتِیاں", "roman": "tattīyā̃", "source": "declension", "tags": [ "feminine", "oblique", "plural" ] } ], "head_templates": [ { "args": { "1": "skr", "2": "adjective", "g": "m", "head": "تَتّا" }, "expansion": "تَتّا (tattā) m", "name": "head" } ], "inflection_templates": [ { "args": { "1": "تت", "2": "tatt" }, "name": "skr-decl-adj" } ], "lang": "Saraiki", "lang_code": "skr", "pos": "adj", "senses": [ { "categories": [ "Pages with 2 entries", "Pages with entries", "Rhymes:Saraiki/aː", "Rhymes:Saraiki/aː/2 syllables", "Sanskrit terms with non-redundant manual transliterations", "Saraiki adjectives", "Saraiki entries with incorrect language header", "Saraiki lemmas", "Saraiki links with redundant wikilinks", "Saraiki terms derived from Prakrit", "Saraiki terms derived from Proto-Indo-European", "Saraiki terms derived from Sanskrit", "Saraiki terms derived from the Proto-Indo-European root *tep-", "Saraiki terms inherited from Prakrit", "Saraiki terms inherited from Proto-Indo-European", "Saraiki terms inherited from Sanskrit", "Saraiki terms with non-redundant manual transliterations" ], "glosses": [ "hot, heated, warm" ], "links": [ [ "hot", "hot" ], [ "heated", "heated" ], [ "warm", "warm" ] ] } ], "sounds": [ { "ipa": "/t̪ət̪.t̪aː/" }, { "rhymes": "-aː" } ], "word": "تتا" }
Download raw JSONL data for تتا meaning in All languages combined (8.7kB)
This page is a part of the kaikki.org machine-readable All languages combined dictionary. This dictionary is based on structured data extracted on 2024-11-28 from the enwiktionary dump dated 2024-11-21 using wiktextract (65a6e81 and 0dbea76). The data shown on this site has been post-processed and various details (e.g., extra categories) removed, some information disambiguated, and additional data merged from other sources. See the raw data download page for the unprocessed wiktextract data.
If you use this data in academic research, please cite Tatu Ylonen: Wiktextract: Wiktionary as Machine-Readable Structured Data, Proceedings of the 13th Conference on Language Resources and Evaluation (LREC), pp. 1317-1325, Marseille, 20-25 June 2022. Linking to the relevant page(s) under https://kaikki.org would also be greatly appreciated.